'''
* This is the project for the Brtc LlmOps Platform
* @Author Leon-liao <liaosiliang@alltman.com>
* @Description Study script: load a Word document with UnstructuredWordDocumentLoader and print the result
* @File: 3_study_excel_loader.py
* @Time: 2025/8/20
* @All Rights Reserved By Brtc
'''
from langchain_community.document_loaders import UnstructuredExcelLoader, UnstructuredPowerPointLoader, \
    UnstructuredWordDocumentLoader

# Alternative loaders for other Office formats (uncomment one to try it):
# excel_loader = UnstructuredExcelLoader("./test.xlsx")
# ppt_loader = UnstructuredPowerPointLoader("./博睿智启公开课第二次.pptx")
# Build the loader for the Word file and read it; the result is kept in
# `docs`, which is measured and indexed below.
word_laoader = UnstructuredWordDocumentLoader("./介绍.docx")
docs = word_laoader.load()

# Show the loaded documents, then how many there are (one item per line).
print(docs, len(docs), sep="\n")
# Show the metadata attached to the first loaded document.
print(docs[0].metadata)